{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 抓取雪球发帖\n",
    "\n",
    "- 作者：DGC'Idea\n",
    "- 版本：V0.1   \n",
    "- 更新日期：2018年4月14日\n",
    "\n",
    "----------\n",
    "\n",
    "- 研究目的：获取微信公众号文章；"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": "数据引擎：运行于研究\n 已准备好！\n"
    }
   ],
   "source": [
    "#引入包\n",
    "import pandas as pd\n",
    "import requests\n",
    "import re\n",
    "import json\n",
    "import time\n",
    "import os\n",
    "\n",
    "\n",
    "# 自定义\n",
    "import sys\n",
    "sys.path.append('../DM')\n",
    "\n",
    "from dm import *\n",
    "from tl import exists_file\n",
    "\n",
    "# 数据目录\n",
    "_data_path='../Data/'\n",
    "# 数据引擎\n",
    "_data=Csv(_data_path)\n",
    "\n",
    "\n",
    "\n",
    "#时间戳转换成日期\n",
    "def timestamp_date(timestamp):\n",
    "    return time.strftime('%Y-%m-%d %H:%M',time.localtime(int(str(timestamp)[0:10])))\n",
    "\n",
    "\n",
    "#读取数据        \n",
    "def read_xueqiu_data(user_id):\n",
    "    #文件名\n",
    "    data_file='xqft_%s.csv'%(user_id)\n",
    "    #从cvs文件恢复数据\n",
    "    df=pd.read_csv(data_file,index_col=0,parse_dates=False)\n",
    "    return df\n",
    "\n",
    "\n",
    "#检测文件      \n",
    "def exists_xueqiu_file(user_id,data_root=_data_path):\n",
    "    #cvs文件名\n",
    "    data_file='%s%s.csv'%(data_root,'msg_xqft_'+user_id)\n",
    "    return exists_file(data_file)\n",
    "\n",
    "\n",
    "#读取数据        \n",
    "def read_xueqiu_data(user_id):\n",
    "    #文件名\n",
    "    data_file='msg_xqft_'+user_id\n",
    "    #从cvs文件恢复数据\n",
    "    df=_data.read(data_file)\n",
    "    return df\n",
    "\n",
    "\n",
    "#保存数据        \n",
    "def save_xueqiu_data(user_id,df):\n",
    "    #文件名\n",
    "    data_file='msg_xqft_'+user_id\n",
    "    #保存到cvs文件\n",
    "    _data.save(data_file,df,append=False)\n",
    "\n",
    "    \n",
    "#性别\n",
    "gender={'m':'男','w':'女'}\n",
    "\n",
    "\n",
    "#雪球网址\n",
    "base_url='https://xueqiu.com'\n",
    "\n",
    "\n",
    "#headers\n",
    "header={\n",
    "    \"HOST\":'xueqiu.com',\n",
    "    'User-Agent':'Mozilla/5.0 (Windows NT 5.1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/53.0.2785.104 \\\n",
    "Safari/537.36 Core/1.53.4620.400 QQBrowser/9.7.13014.400'\n",
    "    }\n",
    "\n",
    "#获取雪球用户信息\n",
    "def get_xueqiu_user(user_id,cookies_str):\n",
    "    #cookies_str转换为字典格式\n",
    "    cookies=get_xueqiu_cookies(cookies_str)  \n",
    "    url='https://xueqiu.com/v4/statuses/user_timeline.json?page=%s&user_id=%s'%(1,user_id)\n",
    "    #获取数据\n",
    "    r=requests.get(url,cookies=cookies,headers=header)\n",
    "    #解析为json\n",
    "    statuses=r.json().get('statuses')[0].get('user')\n",
    "    #获得用户信息\n",
    "    return (statuses.get('screen_name'),#名称\n",
    "            statuses.get('province'),#城市\n",
    "            gender[statuses.get('gender')],#性别\n",
    "            statuses.get('status_count'),#贴子数\n",
    "            statuses.get('stocks_count'),#组合数\n",
    "            statuses.get('friends_count'),#关注数\n",
    "            statuses.get('followers_count'),#粉丝数\n",
    "            statuses.get('description'),)#简介\n",
    "    \n",
    "    \n",
    "#爬取微信公众号文章\n",
    "#user_id：用户识别码\n",
    "#cookies_str：登陆后的cookies字符串，每次登陆后都不一样，所以要手动获取\n",
    "#start：更新的起始位置，用以实现断点续爬和增量更新\n",
    "def get_xueqiu_link(user_id,cookies_str,start_date,first=True,start=0):\n",
    "    #cookies_str转换为字典格式\n",
    "    cookies=get_xueqiu_cookies(cookies_str)  \n",
    "    #数据列表\n",
    "    data_list=[]\n",
    "    #当前页\n",
    "    page=1\n",
    "    #页面总数\n",
    "    maxpage=1\n",
    "    #计数器\n",
    "    count=1\n",
    "    #捕获错误\n",
    "    try:\n",
    "        #遍历所有页\n",
    "        while page<=maxpage:\n",
    "            #url\n",
    "            url='https://xueqiu.com/v4/statuses/user_timeline.json?page=%s&user_id=%s'%(page,user_id)\n",
    "            #获取数据\n",
    "            r=requests.get(url,cookies=cookies,headers=header)\n",
    "#             print (r)\n",
    "            #解析为json\n",
    "            statuses=r.json()\n",
    "            #获得贴子信息\n",
    "            item_list=statuses.get('statuses')\n",
    "            #如果无数据跳出循环\n",
    "            if len(item_list)==0:\n",
    "                break\n",
    "            #如果是首页，获取总页数    \n",
    "            if page==1:\n",
    "                maxpage=int(statuses.get('maxPage')) \n",
    "            #遍历当前页文章列表\n",
    "            for item in item_list:\n",
    "                #剔除置顶贴\n",
    "                if count>1:\n",
    "                    #贴子发表时间\n",
    "                    created_at=timestamp_date(item.get('created_at'))\n",
    "                    #如果是首次获取\n",
    "                    if first==True:\n",
    "                        #获取早于当前时间的所有贴子\n",
    "                        if created_at<start_date :\n",
    "                            #文章链接、标题、时间戳（时间戳转换为日期）\n",
    "                            data_list.append([created_at,item.get('title'),item.get('description'),item.get('text'),\n",
    "                                              base_url+item.get('target'),False])\n",
    "                    #增量获取\n",
    "                    else:\n",
    "                        #获取晚于更新时间的所有贴子\n",
    "                        if created_at>start_date:\n",
    "                             #文章链接、标题、时间戳（时间戳转换为日期）\n",
    "                            data_list.append([created_at,item.get('title'),item.get('description'),item.get('text'),\n",
    "                                              base_url+item.get('target'),False])\n",
    "                        else:\n",
    "                            #超过更新时间，结束\n",
    "                            page=maxpage+1\n",
    "                            break  \n",
    "                print(' 正在检索：%s 篇'%(count),end='\\r')            \n",
    "                #计数            \n",
    "                count+=1    \n",
    "            #页面数递增    \n",
    "            page+=1\n",
    "            #延时，防止被踢\n",
    "            #time.sleep(1)\n",
    "    #打印错误，并忽略        \n",
    "    except Exception as e:\n",
    "        print('错误：%s'%(e))\n",
    "        pass\n",
    "    #没取到数据    \n",
    "    if len(data_list)==0:\n",
    "        return None\n",
    "    else:\n",
    "        #整理数据    \n",
    "        df=pd.DataFrame(data_list,columns=['date','title','description','text','link','sended'])    \n",
    "        #返回数据\n",
    "        return df\n",
    "    \n",
    "    \n",
    "xueqiu_list=[\n",
    "    {\n",
    "    #似乎雪球的cookies可以长期使用，待验证\n",
    "    'cookies':'aliyungf_tc=AQAAAGwSGAyaoQgAUHWuPLg/sqB3ejy4; device_id=dae70533361df97e2a154eb2f1af4151; __utmt=1; remember=1; remember.sig=K4F3faYzmVuqC0iXIERCQf55g2Y; xq_a_token=5654fd39cb89fef36765cc9038bc5b47ad0e62ba; xq_a_token.sig=MZOhC2VaLNqrwpqJk0ONVR8kUMY; xq_r_token=01ee39b512f28c6f395e2d5fc1eeed662ade6a39; xq_r_token.sig=U3jfCcO3T4tjqSenYk1Oevgpufg; xq_is_login=1; xq_is_login.sig=J3LxgPVPUzbBg3Kee_PquUfih7Q; u=6582724674; u.sig=1g3gy3Thq5MyFexbtGy2oMIfDW0; s=e319hj7i0g; bid=14636255fdee238fdda1fc0fe35fbb46_jg4ud6kz; Hm_lvt_1db88642e346389874251b5a1eded6e3=1524040463; Hm_lpvt_1db88642e346389874251b5a1eded6e3=1524040514; __utma=1.585935036.1524040465.1524040465.1524040465.1; __utmb=1.5.10.1524040465; __utmc=1; __utmz=1.1524040465.1.1.utmcsr=sogou.com|utmccn=(referral)|utmcmd=referral|utmcct=/link',\n",
    "    'user_id':'4776750571', \n",
    "    },\n",
    "]        \n",
    "\n",
    "print(' 已准备好！')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 1.设置当前用户"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "ename": "NameError",
     "evalue": "name 'get_xueqiu_cookies' is not defined",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mNameError\u001b[0m                                 Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-2-18f8bb2f70cf>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[0muser_id\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mxueqiu_list\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'user_id'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      2\u001b[0m \u001b[0mcookies\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mxueqiu_list\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'cookies'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 3\u001b[1;33m \u001b[0muser_info\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mget_xueqiu_user\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0muser_id\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcookies\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m      4\u001b[0m \u001b[0muser_name\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0muser_info\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;36m0\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      5\u001b[0m \u001b[0mprint\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m' ID　　'\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0muser_id\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m<ipython-input-1-0a95c1fbf7c0>\u001b[0m in \u001b[0;36mget_xueqiu_user\u001b[1;34m(user_id, cookies_str)\u001b[0m\n\u001b[0;32m     78\u001b[0m \u001b[1;32mdef\u001b[0m \u001b[0mget_xueqiu_user\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0muser_id\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mcookies_str\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     79\u001b[0m     \u001b[1;31m#cookies_str转换为字典格式\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 80\u001b[1;33m     \u001b[0mcookies\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mget_xueqiu_cookies\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mcookies_str\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     81\u001b[0m     \u001b[0murl\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m'https://xueqiu.com/v4/statuses/user_timeline.json?page=%s&user_id=%s'\u001b[0m\u001b[1;33m%\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;36m1\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0muser_id\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     82\u001b[0m     \u001b[1;31m#获取数据\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mNameError\u001b[0m: name 'get_xueqiu_cookies' is not defined"
     ]
    }
   ],
   "source": [
    "user_id=xueqiu_list[0]['user_id'] \n",
    "cookies=xueqiu_list[0]['cookies']\n",
    "user_info=get_xueqiu_user(user_id,cookies)\n",
    "user_name=user_info[0]\n",
    "print(' ID　　',user_id)\n",
    "print(' 名称　',user_info[0])\n",
    "print(' 城市　',user_info[1])\n",
    "print(' 性别　',user_info[2])\n",
    "print(' 帖子　',user_info[3])\n",
    "print(' 组合　',user_info[4])\n",
    "print(' 关注　',user_info[5])\n",
    "print(' 粉丝　',user_info[6])\n",
    "print(' 简介　',user_info[7])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 2.获取贴子"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<Response [200]>\n",
      " 正在检索：1 篇\r",
      "没有新文章或更新不成功！\n"
     ]
    }
   ],
   "source": [
    "# 断点续爬、更新数据\n",
    "#user_id：用户id\n",
    "#cookies：\n",
    "#resume：断点续爬模式\n",
    "def update_xueqiu_data(user_id,cookies,resume=False):\n",
    "    #检查是否已存在数据文件，如存在更新或续爬\n",
    "    if exists_xueqiu_file(user_id):\n",
    "        #读取数据\n",
    "        df=read_xueqiu_data(user_id)\n",
    "        #如果是续爬模式\n",
    "        if resume==True:\n",
    "            #起始位置为最后获取的贴子时间\n",
    "            update_date=df.date.iloc[-1]\n",
    "            new_df=get_xueqiu_link(user_id,cookies,update_date,True) \n",
    "        else:\n",
    "            #起始位置为最新贴子时间\n",
    "            update_date=df.date.iloc[0]\n",
    "            new_df=get_xueqiu_link(user_id,cookies,update_date,False) \n",
    "        if new_df is None:\n",
    "            print('没有新文章或更新不成功！')\n",
    "        else:\n",
    "            if resume==True:\n",
    "                #拼接新、旧数据，顺序不能反\n",
    "                df=pd.concat([df,new_df],ignore_index=True)\n",
    "            else:\n",
    "                #拼接旧、新数据，顺序不能反\n",
    "                df=pd.concat([new_df,df],ignore_index=True) \n",
    "            #保存到cvs文件\n",
    "            save_xueqiu_data(user_id,df)\n",
    "            print(' 共更新：%s 篇文章！'%len(new_df))    \n",
    "    else:\n",
    "        #数据文件不存在，首次获取\n",
    "        update_date=pd.datetime.today().strftime('%Y-%m-%d %H:%M')\n",
    "        df=get_xueqiu_link(user_id,cookies,update_date,True)  \n",
    "        if df is None:\n",
    "            print('获取不成功！')\n",
    "        else:\n",
    "            #保存到cvs文件\n",
    "            save_xueqiu_data(user_id,df)\n",
    "            print(' 共获取：%s 篇文章！'%len(df))\n",
    "    \n",
    "update_xueqiu_data(user_id,cookies,resume=False)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 4.发送邮件"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      " 2018年04月（雪球帖子 ETF拯救世界） 的帖子发送成功！\r"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/opt/conda/lib/python3.4/site-packages/pandas/core/indexing.py:115: SettingWithCopyWarning: \n",
      "A value is trying to be set on a copy of a slice from a DataFrame\n",
      "\n",
      "See the the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy\n",
      "  self._setitem_with_indexer(indexer, value)\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "\n",
    "#引入自定义库\n",
    "sys.path.append(\"/home/jquser/\")\n",
    "from mail import *\n",
    "\n",
    "#发送某月数据\n",
    "def send_xueqiu_data(user_id):\n",
    "    #检查是否已存在数据\n",
    "    if not exists_xueqiu_file(user_id):\n",
    "        print('未找到 %s 的雪球发帖数据表！'%user_id)\n",
    "        return\n",
    "    #读取数据\n",
    "    df=read_xueqiu_data(user_id)\n",
    "    #计算起止年\n",
    "    start_year=int(df.date.iloc[-1][:4])\n",
    "    end_year=int(df.date.iloc[0][:4])+1\n",
    "    #月\n",
    "    m_list=['01','02','03','04','05','06','07','08','09','10','11','12'] \n",
    "    #当前月份\n",
    "    current_month=pd.datetime.today().strftime('%Y-%m')\n",
    "    #已发送标记\n",
    "    issend=False\n",
    "    #遍历年、月\n",
    "    for y in range(start_year,end_year):\n",
    "        for m in m_list:\n",
    "            month=str(y)+'-'+m\n",
    "            #判断是否为当月，当月不发送\n",
    "            if current_month==month:\n",
    "                continue\n",
    "            #按照年月筛选    \n",
    "            temp_df=df[(df.date.str[0:7]==month) & (df.sended==False)]\n",
    "            temp_df=temp_df.sort('date')\n",
    "            if len(temp_df)==0:\n",
    "                continue  \n",
    "            #生成月邮件正文    \n",
    "            message=''\n",
    "            for i in range(len(temp_df)):\n",
    "                #标题（如果有）\n",
    "                if str(temp_df.title.iloc[i])!='nan':\n",
    "                    message+='<h3>%s</h3>'%temp_df.title.iloc[i] \n",
    "                #日期\n",
    "                message+='<p>%s</p>'%temp_df.date.iloc[i]  \n",
    "                #url\n",
    "                message+='<p>%s</p>'%temp_df.link.iloc[i] \n",
    "                #正文    \n",
    "                message+='%s</br></br><hr /></br>'%temp_df.text.iloc[i] \n",
    "            #邮件主题    \n",
    "            subjiect='%s年%s月（雪球帖子 %s）'%(y,m,user_name)\n",
    "            #内容标题\n",
    "            title='<h2>%s</h2></br><hr />'%(subjiect)\n",
    "            #邮件内容\n",
    "            message=title+message\n",
    "            #去除多余的行\n",
    "            message=message.replace('<br/><br/>','').replace('</p></br>','</p>').replace('<p><br/></p>','')\n",
    "            try:\n",
    "                #发送邮件\n",
    "                send_html_qqmail(subjiect,message)\n",
    "                #标记已发送\n",
    "                if len(temp_df)==1:\n",
    "                    df.sended.iloc[temp_df.index[0]]=True\n",
    "                else:\n",
    "                    df.sended.iloc[temp_df.index[-1]:temp_df.index[0]+1]=True\n",
    "                issend=True    \n",
    "                print(' %s 的帖子发送成功！'%(subjiect),end='\\r')\n",
    "                #延时5秒，防止被踢\n",
    "                time.sleep(3)\n",
    "            except:\n",
    "                print(' %s 的帖子发送失败！'%(subjiect),end='\\r')\n",
    "    #如果有发送，则保存            \n",
    "    if issend:\n",
    "        save_xueqiu_data(user_id,df)\n",
    "\n",
    "        \n",
    "send_xueqiu_data(user_id)  "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 5.查看数据表"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>date</th>\n",
       "      <th>title</th>\n",
       "      <th>description</th>\n",
       "      <th>text</th>\n",
       "      <th>link</th>\n",
       "      <th>sended</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2018-04-26 23:57</td>\n",
       "      <td>NaN</td>\n",
       "      <td>再休息三个月。2018的第一次休息。浪费太多时间了。人生苦短，用有限的时间做点有意义的事。八月见。</td>\n",
       "      <td>再休息三个月。2018的第一次休息。&lt;br/&gt;&lt;br/&gt;浪费太多时间了。人生苦短，用有限的时...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106113411</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2018-04-26 16:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/yejiangming\" ta...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/yejiangming\" ta...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106077493</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2018-04-26 16:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>排名一般。</td>\n",
       "      <td>排名一般。</td>\n",
       "      <td>https://xueqiu.com/4776750571/106072614</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>2018-04-26 15:52</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/控计得句计己的狸狸\" targ...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/控计得句计己的狸狸\" targ...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106071401</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>2018-04-26 15:25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/茫然的笨脚大哥\" target...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/茫然的笨脚大哥\" target...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106069090</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>2018-04-26 15:22</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/又见炊烟1999\" targe...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/又见炊烟1999\" targe...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106068871</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>2018-04-26 15:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/Poise\" target=\"...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/Poise\" target=\"...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106068724</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>2018-04-26 14:55</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/乐视坑爹啊\" target=\"...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/乐视坑爹啊\" target=\"...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106065784</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>2018-04-26 14:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>忘了说了。其实，太多人并没有经历过真正的深冬。在他们的世界观里，春夏秋冬其实是不完整的。over。</td>\n",
       "      <td>忘了说了。其实，太多人并没有经历过真正的深冬。在他们的世界观里，春夏秋冬其实是不完整的。over。</td>\n",
       "      <td>https://xueqiu.com/4776750571/106064144</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>2018-04-26 14:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>各位，我表达一下自己的一些想法，不对的请指教。 前几天说过，趋势其实很重要。我们不一定按照趋...</td>\n",
       "      <td>&lt;p&gt;各位，我表达一下自己的一些想法，不对的请指教。&lt;/p&gt;&lt;p&gt;&lt;br/&gt;&lt;/p&gt;&lt;p&gt;前...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106061476</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>2018-04-26 13:59</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/偏好设置\" target=\"_...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/偏好设置\" target=\"_...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106059038</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>2018-04-26 13:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/zy77\" target=\"_...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/zy77\" target=\"_...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106058270</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>2018-04-26 13:29</td>\n",
       "      <td>NaN</td>\n",
       "      <td>保持节奏。保证绝大多数人都死了你还有子弹跟敌人干。</td>\n",
       "      <td>&lt;p&gt;保持节奏。保证绝大多数人都死了你还有子弹跟敌人干。&lt;/p&gt;</td>\n",
       "      <td>https://xueqiu.com/4776750571/106056058</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>2018-04-26 11:58</td>\n",
       "      <td>NaN</td>\n",
       "      <td>确定发车半小时； 写文章一小时； 找音乐半个月。 …… 有骨气，不见不散。</td>\n",
       "      <td>&lt;p&gt;确定发车半小时；&lt;/p&gt;&lt;p&gt;&lt;br/&gt;&lt;/p&gt;&lt;p&gt;写文章一小时；&lt;/p&gt;&lt;p&gt;&lt;b...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106050088</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>2018-04-26 10:37</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106040890</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>2018-04-26 09:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>前天有没有进去的，报个道吧……</td>\n",
       "      <td>前天有没有进去的，报个道吧……</td>\n",
       "      <td>https://xueqiu.com/4776750571/106033387</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>2018-04-26 09:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106031069</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>2018-04-26 09:32</td>\n",
       "      <td>NaN</td>\n",
       "      <td>有个事情我不明白啊，学习好的给讲讲。 经常看到有些大牛股，半年一倍，三年五倍那种。比如从10...</td>\n",
       "      <td>&lt;p&gt;有个事情我不明白啊，学习好的给讲讲。&lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;p&gt;经常看到有些大牛股，半...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106029813</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>2018-04-26 08:25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/LongkerDandy\" t...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/LongkerDandy\" t...</td>\n",
       "      <td>https://xueqiu.com/4776750571/106023693</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>2018-04-25 17:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/随机矩阵\" target=\"_...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/随机矩阵\" target=\"_...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105970908</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>2018-04-25 16:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/gulugulubing\" t...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/gulugulubing\" t...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105966165</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>2018-04-25 15:15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/口水常流\" target=\"_...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/口水常流\" target=\"_...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105958849</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>2018-04-25 14:59</td>\n",
       "      <td>NaN</td>\n",
       "      <td>&lt;a href=\"http://xueqiu.com/S/SH000991\" target=...</td>\n",
       "      <td>&lt;p&gt;&lt;a href=\"http://xueqiu.com/S/SH000991\" targ...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105957331</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>2018-04-24 16:08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>说真的，你现在看纽约油价69，布伦特油价74，还在不停涨。再想想两年前26的时候多少人说以后...</td>\n",
       "      <td>&lt;p&gt;说真的，你现在看纽约油价69，布伦特油价74，还在不停涨。再想想两年前26的时候多少人...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105864583</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>2018-04-24 15:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/不明真相的大韭菜\" targe...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/不明真相的大韭菜\" targe...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105862794</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>2018-04-24 15:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/真_井木犴\" target=\"...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/真_井木犴\" target=\"...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105859863</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>2018-04-24 14:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>我的投资理念啊， 一个是不预测，因为预测不了。水平高点的人，预测正确的次数多点，水平低的人每...</td>\n",
       "      <td>&lt;p&gt;我的投资理念啊，&lt;/p&gt;&lt;p&gt;&lt;br/&gt;&lt;/p&gt;&lt;p&gt;一个是不预测，因为预测不了。水平...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105857568</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>2018-04-24 14:41</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/旅者阿王\" target=\"_...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/旅者阿王\" target=\"_...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105855940</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>2018-04-24 14:27</td>\n",
       "      <td>NaN</td>\n",
       "      <td>以后开车前一周不说话了，请监督。//&lt;a href=\"http://xueqiu.com/n...</td>\n",
       "      <td>以后开车前一周不说话了，请监督。//&lt;a href=\"http://xueqiu.com/n...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105854112</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>2018-04-24 11:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/华宝油气\" target=\"_...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/华宝油气\" target=\"_...</td>\n",
       "      <td>https://xueqiu.com/4776750571/105841614</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1824</th>\n",
       "      <td>2015-04-03 09:25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/旅行者零号\" target=\"...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/旅行者零号\" target=\"...</td>\n",
       "      <td>https://xueqiu.com/4776750571/39694788</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1825</th>\n",
       "      <td>2015-04-02 14:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/三少爷4\" target=\"_...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/三少爷4\" target=\"_...</td>\n",
       "      <td>https://xueqiu.com/4776750571/39619213</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1826</th>\n",
       "      <td>2015-04-02 13:29</td>\n",
       "      <td>A股是个聚宝盆</td>\n",
       "      <td>最近，A股是不是一个“吃人不吐骨头”的市场似乎在雪球引起了不小的争议。在这个市场上，只有10...</td>\n",
       "      <td>最近，A股是不是一个“吃人不吐骨头”的市场似乎在雪球引起了不小的争议。在这个市场上，只有10...</td>\n",
       "      <td>https://xueqiu.com/4776750571/39611266</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1827</th>\n",
       "      <td>2015-03-31 16:29</td>\n",
       "      <td>大风起兮猪飞扬</td>\n",
       "      <td>看图说话：1、全市场pe与深综指对比图：全市场pe已经越过2010年高点，冲向07年最后的高...</td>\n",
       "      <td>看图说话：&lt;br/&gt;&lt;br/&gt;1、全市场pe与深综指对比图：全市场pe已经越过2010年高点...</td>\n",
       "      <td>https://xueqiu.com/4776750571/39421175</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1828</th>\n",
       "      <td>2015-03-26 11:24</td>\n",
       "      <td>NaN</td>\n",
       "      <td>财富，聚集在智商低的人手中是不科学的。这样无法发挥财富的最大效用。所以，这个社会会通过各种方...</td>\n",
       "      <td>财富，聚集在智商低的人手中是不科学的。这样无法发挥财富的最大效用。所以，这个社会会通过各种方...</td>\n",
       "      <td>https://xueqiu.com/4776750571/39002771</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1829</th>\n",
       "      <td>2015-03-25 16:27</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/大冬\" target=\"_bl...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/大冬\" target=\"_bl...</td>\n",
       "      <td>https://xueqiu.com/4776750571/38927951</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1830</th>\n",
       "      <td>2015-03-25 16:14</td>\n",
       "      <td>NaN</td>\n",
       "      <td>四点读后感：1、牛市中一定要战胜指数是个心魔。老巴也做不到，但这并不妨碍他如此成功。2、现金...</td>\n",
       "      <td>四点读后感：&lt;br/&gt;&lt;br/&gt;1、牛市中一定要战胜指数是个心魔。老巴也做不到，但这并不妨碍...</td>\n",
       "      <td>https://xueqiu.com/4776750571/38926736</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1831</th>\n",
       "      <td>2015-03-23 13:23</td>\n",
       "      <td>大牛市好刺激</td>\n",
       "      <td>中午扫了一眼wind金融终端，pe数据有点意思。纯记录一下，日后看一定有趣。有数据的2576...</td>\n",
       "      <td>中午扫了一眼wind金融终端，pe数据有点意思。纯记录一下，日后看一定有趣。&lt;br&gt;&lt;br&gt;...</td>\n",
       "      <td>https://xueqiu.com/4776750571/38705035</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1832</th>\n",
       "      <td>2015-03-05 14:32</td>\n",
       "      <td>NaN</td>\n",
       "      <td>旱则资舟，水则资车，物之理也。论其有余不足，则知贵贱。贵上极则反贱，贱下极则反贵。 贵出如粪...</td>\n",
       "      <td>旱则资舟，水则资车，物之理也。论其有余不足，则知贵贱。贵上极则反贱，贱下极则反贵。&amp;nbsp...</td>\n",
       "      <td>https://xueqiu.com/4776750571/37461774</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1833</th>\n",
       "      <td>2015-03-04 14:47</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/不断重复的愚蠢\" target...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/不断重复的愚蠢\" target...</td>\n",
       "      <td>https://xueqiu.com/4776750571/37379542</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1834</th>\n",
       "      <td>2015-03-04 11:46</td>\n",
       "      <td>剩下的钱你们赚吧</td>\n",
       "      <td>不想说太多，只是说，这一轮的钱我赚够了。剩下的钱，给别人赚。大家都赚才好嘛。今天把仓位降到1...</td>\n",
       "      <td>不想说太多，只是说，这一轮的钱我赚够了。&lt;br&gt;&lt;br&gt;剩下的钱，给别人赚。大家都赚才好嘛。...</td>\n",
       "      <td>https://xueqiu.com/4776750571/37365767</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1835</th>\n",
       "      <td>2015-02-06 14:22</td>\n",
       "      <td>NaN</td>\n",
       "      <td>求教有识之士一个问题：为什么工地上的农民工辛辛苦苦累死累活一个月才挣6000块，还有欠薪风险...</td>\n",
       "      <td>求教有识之士一个问题：&lt;br&gt;&lt;br&gt;为什么工地上的农民工辛辛苦苦累死累活一个月才挣6000...</td>\n",
       "      <td>https://xueqiu.com/4776750571/36351512</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1836</th>\n",
       "      <td>2015-02-03 08:47</td>\n",
       "      <td>NaN</td>\n",
       "      <td>以上都不是最重要的，最重要是下面这段：收割韭菜每年收割的次数，决定于韭菜的长势、施肥情况及市...</td>\n",
       "      <td>以上都不是最重要的，最重要是下面这段：&lt;br/&gt;&lt;br/&gt;收割韭菜每年收割的次数，决定于韭菜...</td>\n",
       "      <td>https://xueqiu.com/4776750571/36164544</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1837</th>\n",
       "      <td>2015-02-02 14:10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>私以为，辛巴这样的说法不妥。其一，“我亏得不比任何一个人少”这句就不合适。据我推断，南铝无非...</td>\n",
       "      <td>私以为，辛巴这样的说法不妥。&lt;br/&gt;&lt;br/&gt;其一，“我亏得不比任何一个人少”这句就不合适...</td>\n",
       "      <td>https://xueqiu.com/4776750571/36127672</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1838</th>\n",
       "      <td>2015-01-03 14:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/最爱月光白\" target=\"...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/最爱月光白\" target=\"...</td>\n",
       "      <td>https://xueqiu.com/4776750571/34773642</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1839</th>\n",
       "      <td>2015-01-02 21:43</td>\n",
       "      <td>2015：ETF投资计划的过去、现在和未来</td>\n",
       "      <td>闲话不多说，进入正题： 壹：现在的市场估值 古语有云：没有数据的论点都是耍流氓。先上数据：图...</td>\n",
       "      <td>闲话不多说，进入正题：&lt;br&gt;&lt;br&gt;&lt;strong&gt;壹：现在的市场估值&lt;br&gt;&lt;br&gt;&lt;b...</td>\n",
       "      <td>https://xueqiu.com/4776750571/34758228</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1840</th>\n",
       "      <td>2014-10-31 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2014-10-31以￥116.15卖出&lt;a href=\"http://xueqiu.com...</td>\n",
       "      <td>2014-10-31以￥116.15卖出&lt;a href=\"http://xueqiu.com...</td>\n",
       "      <td>https://xueqiu.com/4776750571/32609697</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1841</th>\n",
       "      <td>2014-10-21 10:40</td>\n",
       "      <td>NaN</td>\n",
       "      <td>仅仅是简单定投也许会赚钱，但用钱的时候你会发现收益非常非常一般。怎么做？做个组合吧。贴篇旧文...</td>\n",
       "      <td>仅仅是简单定投也许会赚钱，但用钱的时候你会发现收益非常非常一般。&lt;br&gt;&lt;br&gt;怎么做？做个...</td>\n",
       "      <td>https://xueqiu.com/4776750571/32357428</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1842</th>\n",
       "      <td>2014-03-25 09:55</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/davy31\" target=...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/davy31\" target=...</td>\n",
       "      <td>https://xueqiu.com/4776750571/28411365</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1843</th>\n",
       "      <td>2014-03-23 21:45</td>\n",
       "      <td>再说etf资产配置</td>\n",
       "      <td>从大的方面来讲，资产配置的重点，就是把资产合理配置到相关系数很低的各项资产中。相关系数低，也...</td>\n",
       "      <td>从大的方面来讲，资产配置的重点，就是把资产合理配置到相关系数很低的各项资产中。相关系数低，也...</td>\n",
       "      <td>https://xueqiu.com/4776750571/28380907</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1844</th>\n",
       "      <td>2014-03-17 11:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/不明真相的群众\" target...</td>\n",
       "      <td>回复&lt;a href=\"http://xueqiu.com/n/不明真相的群众\" target...</td>\n",
       "      <td>https://xueqiu.com/4776750571/28256633</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1845</th>\n",
       "      <td>2014-03-17 10:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>其实真的特别简单。可是很多人一定不同意。A股挣钱难是因为大多数时间都是高估的。这个时候入场，...</td>\n",
       "      <td>其实真的特别简单。可是很多人一定不同意。&lt;br&gt;&lt;br&gt;A股挣钱难是因为大多数时间都是高估的...</td>\n",
       "      <td>https://xueqiu.com/4776750571/28256189</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1846</th>\n",
       "      <td>2014-03-13 09:10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2008年12月31日，富国银行每股净资产16.02。3个月后，它的股价跌到了7.11。pb...</td>\n",
       "      <td>2008年12月31日，富国银行每股净资产16.02。3个月后，它的股价跌到了7.11。pb...</td>\n",
       "      <td>https://xueqiu.com/4776750571/28192515</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1847</th>\n",
       "      <td>2014-03-12 09:22</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国股市跟成熟股市最大的不同是什么？其实是散户比重过大。这里的散户并不是仅指个人，也包括很大...</td>\n",
       "      <td>中国股市跟成熟股市最大的不同是什么？其实是散户比重过大。这里的散户并不是仅指个人，也包括很大...</td>\n",
       "      <td>https://xueqiu.com/4776750571/28168069</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1848</th>\n",
       "      <td>2014-03-11 09:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>当然不是。很多所谓大盘蓝筹股实际上自由流通股非常小。去掉国家这个大股东的流通股（这部分几乎不...</td>\n",
       "      <td>当然不是。很多所谓大盘蓝筹股实际上自由流通股非常小。&lt;br&gt;去掉国家这个大股东的流通股（这部...</td>\n",
       "      <td>https://xueqiu.com/4776750571/28142712</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1849</th>\n",
       "      <td>2014-01-06 15:30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2014-01-06以￥91.42买入&lt;a href=\"http://xueqiu.com/...</td>\n",
       "      <td>2014-01-06以￥91.42买入&lt;a href=\"http://xueqiu.com/...</td>\n",
       "      <td>https://xueqiu.com/4776750571/26959576</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1850</th>\n",
       "      <td>2013-12-16 13:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2013-12-16以￥95.81买入&lt;a href=\"http://xueqiu.com/...</td>\n",
       "      <td>2013-12-16以￥95.81买入&lt;a href=\"http://xueqiu.com/...</td>\n",
       "      <td>https://xueqiu.com/4776750571/26639988</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1851</th>\n",
       "      <td>2013-10-31 16:30</td>\n",
       "      <td>本月A股市场估值</td>\n",
       "      <td>恰逢季报出尽，又是月底。这次上个全的A股估值图。本月亮点有二：1 国债收益率暴增，过去十年罕...</td>\n",
       "      <td>恰逢季报出尽，又是月底。这次上个全的A股估值图。&lt;br&gt;&lt;br&gt;本月亮点有二：&lt;br&gt;1 国...</td>\n",
       "      <td>https://xueqiu.com/4776750571/25926466</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1852</th>\n",
       "      <td>2013-07-15 09:53</td>\n",
       "      <td>2000点说仓位</td>\n",
       "      <td>本杰明格雷厄姆在上世纪60年代出版的，针对业余投资者的圣经（针对专业投资者的圣经则是《证券分...</td>\n",
       "      <td>本杰明格雷厄姆在上世纪60年代出版的，针对业余投资者的圣经（针对专业投资者的圣经则是《证券分...</td>\n",
       "      <td>https://xueqiu.com/4776750571/24426764</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1853</th>\n",
       "      <td>2012-11-28 11:09</td>\n",
       "      <td>标题</td>\n",
       "      <td>今天，看着不断暴跌的中小板，没有等到15:40 wind上的数据计算结束，我就知道，这是伟大...</td>\n",
       "      <td>今天，看着不断暴跌的中小板，没有等到15:40 wind上的数据计算结束，我就知道，这是伟大...</td>\n",
       "      <td>https://xueqiu.com/4776750571/22523458</td>\n",
       "      <td>True</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1854 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                  date                  title  \\\n",
       "0     2018-04-26 23:57                    NaN   \n",
       "1     2018-04-26 16:51                    NaN   \n",
       "2     2018-04-26 16:04                    NaN   \n",
       "3     2018-04-26 15:52                    NaN   \n",
       "4     2018-04-26 15:25                    NaN   \n",
       "5     2018-04-26 15:22                    NaN   \n",
       "6     2018-04-26 15:20                    NaN   \n",
       "7     2018-04-26 14:55                    NaN   \n",
       "8     2018-04-26 14:42                    NaN   \n",
       "9     2018-04-26 14:20                    NaN   \n",
       "10    2018-04-26 13:59                    NaN   \n",
       "11    2018-04-26 13:50                    NaN   \n",
       "12    2018-04-26 13:29                    NaN   \n",
       "13    2018-04-26 11:58                    NaN   \n",
       "14    2018-04-26 10:37                    NaN   \n",
       "15    2018-04-26 09:51                    NaN   \n",
       "16    2018-04-26 09:38                    NaN   \n",
       "17    2018-04-26 09:32                    NaN   \n",
       "18    2018-04-26 08:25                    NaN   \n",
       "19    2018-04-25 17:38                    NaN   \n",
       "20    2018-04-25 16:39                    NaN   \n",
       "21    2018-04-25 15:15                    NaN   \n",
       "22    2018-04-25 14:59                    NaN   \n",
       "23    2018-04-24 16:08                    NaN   \n",
       "24    2018-04-24 15:49                    NaN   \n",
       "25    2018-04-24 15:16                    NaN   \n",
       "26    2018-04-24 14:54                    NaN   \n",
       "27    2018-04-24 14:41                    NaN   \n",
       "28    2018-04-24 14:27                    NaN   \n",
       "29    2018-04-24 11:38                    NaN   \n",
       "...                ...                    ...   \n",
       "1824  2015-04-03 09:25                    NaN   \n",
       "1825  2015-04-02 14:38                    NaN   \n",
       "1826  2015-04-02 13:29                A股是个聚宝盆   \n",
       "1827  2015-03-31 16:29                大风起兮猪飞扬   \n",
       "1828  2015-03-26 11:24                    NaN   \n",
       "1829  2015-03-25 16:27                    NaN   \n",
       "1830  2015-03-25 16:14                    NaN   \n",
       "1831  2015-03-23 13:23                 大牛市好刺激   \n",
       "1832  2015-03-05 14:32                    NaN   \n",
       "1833  2015-03-04 14:47                    NaN   \n",
       "1834  2015-03-04 11:46               剩下的钱你们赚吧   \n",
       "1835  2015-02-06 14:22                    NaN   \n",
       "1836  2015-02-03 08:47                    NaN   \n",
       "1837  2015-02-02 14:10                    NaN   \n",
       "1838  2015-01-03 14:03                    NaN   \n",
       "1839  2015-01-02 21:43  2015：ETF投资计划的过去、现在和未来   \n",
       "1840  2014-10-31 09:48                    NaN   \n",
       "1841  2014-10-21 10:40                    NaN   \n",
       "1842  2014-03-25 09:55                    NaN   \n",
       "1843  2014-03-23 21:45              再说etf资产配置   \n",
       "1844  2014-03-17 11:09                    NaN   \n",
       "1845  2014-03-17 10:49                    NaN   \n",
       "1846  2014-03-13 09:10                    NaN   \n",
       "1847  2014-03-12 09:22                    NaN   \n",
       "1848  2014-03-11 09:16                    NaN   \n",
       "1849  2014-01-06 15:30                    NaN   \n",
       "1850  2013-12-16 13:48                    NaN   \n",
       "1851  2013-10-31 16:30               本月A股市场估值   \n",
       "1852  2013-07-15 09:53               2000点说仓位   \n",
       "1853  2012-11-28 11:09                     标题   \n",
       "\n",
       "                                            description  \\\n",
       "0     再休息三个月。2018的第一次休息。浪费太多时间了。人生苦短，用有限的时间做点有意义的事。八月见。   \n",
       "1     回复<a href=\"http://xueqiu.com/n/yejiangming\" ta...   \n",
       "2                                                 排名一般。   \n",
       "3     回复<a href=\"http://xueqiu.com/n/控计得句计己的狸狸\" targ...   \n",
       "4     回复<a href=\"http://xueqiu.com/n/茫然的笨脚大哥\" target...   \n",
       "5     回复<a href=\"http://xueqiu.com/n/又见炊烟1999\" targe...   \n",
       "6     回复<a href=\"http://xueqiu.com/n/Poise\" target=\"...   \n",
       "7     回复<a href=\"http://xueqiu.com/n/乐视坑爹啊\" target=\"...   \n",
       "8     忘了说了。其实，太多人并没有经历过真正的深冬。在他们的世界观里，春夏秋冬其实是不完整的。over。   \n",
       "9     各位，我表达一下自己的一些想法，不对的请指教。 前几天说过，趋势其实很重要。我们不一定按照趋...   \n",
       "10    回复<a href=\"http://xueqiu.com/n/偏好设置\" target=\"_...   \n",
       "11    回复<a href=\"http://xueqiu.com/n/zy77\" target=\"_...   \n",
       "12                            保持节奏。保证绝大多数人都死了你还有子弹跟敌人干。   \n",
       "13                确定发车半小时； 写文章一小时； 找音乐半个月。 …… 有骨气，不见不散。   \n",
       "14    回复<a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...   \n",
       "15                                      前天有没有进去的，报个道吧……   \n",
       "16    回复<a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...   \n",
       "17    有个事情我不明白啊，学习好的给讲讲。 经常看到有些大牛股，半年一倍，三年五倍那种。比如从10...   \n",
       "18    回复<a href=\"http://xueqiu.com/n/LongkerDandy\" t...   \n",
       "19    回复<a href=\"http://xueqiu.com/n/随机矩阵\" target=\"_...   \n",
       "20    回复<a href=\"http://xueqiu.com/n/gulugulubing\" t...   \n",
       "21    回复<a href=\"http://xueqiu.com/n/口水常流\" target=\"_...   \n",
       "22    <a href=\"http://xueqiu.com/S/SH000991\" target=...   \n",
       "23    说真的，你现在看纽约油价69，布伦特油价74，还在不停涨。再想想两年前26的时候多少人说以后...   \n",
       "24    回复<a href=\"http://xueqiu.com/n/不明真相的大韭菜\" targe...   \n",
       "25    回复<a href=\"http://xueqiu.com/n/真_井木犴\" target=\"...   \n",
       "26    我的投资理念啊， 一个是不预测，因为预测不了。水平高点的人，预测正确的次数多点，水平低的人每...   \n",
       "27    回复<a href=\"http://xueqiu.com/n/旅者阿王\" target=\"_...   \n",
       "28    以后开车前一周不说话了，请监督。//<a href=\"http://xueqiu.com/n...   \n",
       "29    回复<a href=\"http://xueqiu.com/n/华宝油气\" target=\"_...   \n",
       "...                                                 ...   \n",
       "1824  回复<a href=\"http://xueqiu.com/n/旅行者零号\" target=\"...   \n",
       "1825  回复<a href=\"http://xueqiu.com/n/三少爷4\" target=\"_...   \n",
       "1826  最近，A股是不是一个“吃人不吐骨头”的市场似乎在雪球引起了不小的争议。在这个市场上，只有10...   \n",
       "1827  看图说话：1、全市场pe与深综指对比图：全市场pe已经越过2010年高点，冲向07年最后的高...   \n",
       "1828  财富，聚集在智商低的人手中是不科学的。这样无法发挥财富的最大效用。所以，这个社会会通过各种方...   \n",
       "1829  回复<a href=\"http://xueqiu.com/n/大冬\" target=\"_bl...   \n",
       "1830  四点读后感：1、牛市中一定要战胜指数是个心魔。老巴也做不到，但这并不妨碍他如此成功。2、现金...   \n",
       "1831  中午扫了一眼wind金融终端，pe数据有点意思。纯记录一下，日后看一定有趣。有数据的2576...   \n",
       "1832  旱则资舟，水则资车，物之理也。论其有余不足，则知贵贱。贵上极则反贱，贱下极则反贵。 贵出如粪...   \n",
       "1833  回复<a href=\"http://xueqiu.com/n/不断重复的愚蠢\" target...   \n",
       "1834  不想说太多，只是说，这一轮的钱我赚够了。剩下的钱，给别人赚。大家都赚才好嘛。今天把仓位降到1...   \n",
       "1835  求教有识之士一个问题：为什么工地上的农民工辛辛苦苦累死累活一个月才挣6000块，还有欠薪风险...   \n",
       "1836  以上都不是最重要的，最重要是下面这段：收割韭菜每年收割的次数，决定于韭菜的长势、施肥情况及市...   \n",
       "1837  私以为，辛巴这样的说法不妥。其一，“我亏得不比任何一个人少”这句就不合适。据我推断，南铝无非...   \n",
       "1838  回复<a href=\"http://xueqiu.com/n/最爱月光白\" target=\"...   \n",
       "1839  闲话不多说，进入正题： 壹：现在的市场估值 古语有云：没有数据的论点都是耍流氓。先上数据：图...   \n",
       "1840  2014-10-31以￥116.15卖出<a href=\"http://xueqiu.com...   \n",
       "1841  仅仅是简单定投也许会赚钱，但用钱的时候你会发现收益非常非常一般。怎么做？做个组合吧。贴篇旧文...   \n",
       "1842  回复<a href=\"http://xueqiu.com/n/davy31\" target=...   \n",
       "1843  从大的方面来讲，资产配置的重点，就是把资产合理配置到相关系数很低的各项资产中。相关系数低，也...   \n",
       "1844  回复<a href=\"http://xueqiu.com/n/不明真相的群众\" target...   \n",
       "1845  其实真的特别简单。可是很多人一定不同意。A股挣钱难是因为大多数时间都是高估的。这个时候入场，...   \n",
       "1846  2008年12月31日，富国银行每股净资产16.02。3个月后，它的股价跌到了7.11。pb...   \n",
       "1847  中国股市跟成熟股市最大的不同是什么？其实是散户比重过大。这里的散户并不是仅指个人，也包括很大...   \n",
       "1848  当然不是。很多所谓大盘蓝筹股实际上自由流通股非常小。去掉国家这个大股东的流通股（这部分几乎不...   \n",
       "1849  2014-01-06以￥91.42买入<a href=\"http://xueqiu.com/...   \n",
       "1850  2013-12-16以￥95.81买入<a href=\"http://xueqiu.com/...   \n",
       "1851  恰逢季报出尽，又是月底。这次上个全的A股估值图。本月亮点有二：1 国债收益率暴增，过去十年罕...   \n",
       "1852  本杰明格雷厄姆在上世纪60年代出版的，针对业余投资者的圣经（针对专业投资者的圣经则是《证券分...   \n",
       "1853  今天，看着不断暴跌的中小板，没有等到15:40 wind上的数据计算结束，我就知道，这是伟大...   \n",
       "\n",
       "                                                   text  \\\n",
       "0     再休息三个月。2018的第一次休息。<br/><br/>浪费太多时间了。人生苦短，用有限的时...   \n",
       "1     回复<a href=\"http://xueqiu.com/n/yejiangming\" ta...   \n",
       "2                                                 排名一般。   \n",
       "3     回复<a href=\"http://xueqiu.com/n/控计得句计己的狸狸\" targ...   \n",
       "4     回复<a href=\"http://xueqiu.com/n/茫然的笨脚大哥\" target...   \n",
       "5     回复<a href=\"http://xueqiu.com/n/又见炊烟1999\" targe...   \n",
       "6     回复<a href=\"http://xueqiu.com/n/Poise\" target=\"...   \n",
       "7     回复<a href=\"http://xueqiu.com/n/乐视坑爹啊\" target=\"...   \n",
       "8     忘了说了。其实，太多人并没有经历过真正的深冬。在他们的世界观里，春夏秋冬其实是不完整的。over。   \n",
       "9     <p>各位，我表达一下自己的一些想法，不对的请指教。</p><p><br/></p><p>前...   \n",
       "10    回复<a href=\"http://xueqiu.com/n/偏好设置\" target=\"_...   \n",
       "11    回复<a href=\"http://xueqiu.com/n/zy77\" target=\"_...   \n",
       "12                     <p>保持节奏。保证绝大多数人都死了你还有子弹跟敌人干。</p>   \n",
       "13    <p>确定发车半小时；</p><p><br/></p><p>写文章一小时；</p><p><b...   \n",
       "14    回复<a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...   \n",
       "15                                      前天有没有进去的，报个道吧……   \n",
       "16    回复<a href=\"http://xueqiu.com/n/小毛孩\" target=\"_b...   \n",
       "17    <p>有个事情我不明白啊，学习好的给讲讲。</p><p></p><p>经常看到有些大牛股，半...   \n",
       "18    回复<a href=\"http://xueqiu.com/n/LongkerDandy\" t...   \n",
       "19    回复<a href=\"http://xueqiu.com/n/随机矩阵\" target=\"_...   \n",
       "20    回复<a href=\"http://xueqiu.com/n/gulugulubing\" t...   \n",
       "21    回复<a href=\"http://xueqiu.com/n/口水常流\" target=\"_...   \n",
       "22    <p><a href=\"http://xueqiu.com/S/SH000991\" targ...   \n",
       "23    <p>说真的，你现在看纽约油价69，布伦特油价74，还在不停涨。再想想两年前26的时候多少人...   \n",
       "24    回复<a href=\"http://xueqiu.com/n/不明真相的大韭菜\" targe...   \n",
       "25    回复<a href=\"http://xueqiu.com/n/真_井木犴\" target=\"...   \n",
       "26    <p>我的投资理念啊，</p><p><br/></p><p>一个是不预测，因为预测不了。水平...   \n",
       "27    回复<a href=\"http://xueqiu.com/n/旅者阿王\" target=\"_...   \n",
       "28    以后开车前一周不说话了，请监督。//<a href=\"http://xueqiu.com/n...   \n",
       "29    回复<a href=\"http://xueqiu.com/n/华宝油气\" target=\"_...   \n",
       "...                                                 ...   \n",
       "1824  回复<a href=\"http://xueqiu.com/n/旅行者零号\" target=\"...   \n",
       "1825  回复<a href=\"http://xueqiu.com/n/三少爷4\" target=\"_...   \n",
       "1826  最近，A股是不是一个“吃人不吐骨头”的市场似乎在雪球引起了不小的争议。在这个市场上，只有10...   \n",
       "1827  看图说话：<br/><br/>1、全市场pe与深综指对比图：全市场pe已经越过2010年高点...   \n",
       "1828  财富，聚集在智商低的人手中是不科学的。这样无法发挥财富的最大效用。所以，这个社会会通过各种方...   \n",
       "1829  回复<a href=\"http://xueqiu.com/n/大冬\" target=\"_bl...   \n",
       "1830  四点读后感：<br/><br/>1、牛市中一定要战胜指数是个心魔。老巴也做不到，但这并不妨碍...   \n",
       "1831  中午扫了一眼wind金融终端，pe数据有点意思。纯记录一下，日后看一定有趣。<br><br>...   \n",
       "1832  旱则资舟，水则资车，物之理也。论其有余不足，则知贵贱。贵上极则反贱，贱下极则反贵。&nbsp...   \n",
       "1833  回复<a href=\"http://xueqiu.com/n/不断重复的愚蠢\" target...   \n",
       "1834  不想说太多，只是说，这一轮的钱我赚够了。<br><br>剩下的钱，给别人赚。大家都赚才好嘛。...   \n",
       "1835  求教有识之士一个问题：<br><br>为什么工地上的农民工辛辛苦苦累死累活一个月才挣6000...   \n",
       "1836  以上都不是最重要的，最重要是下面这段：<br/><br/>收割韭菜每年收割的次数，决定于韭菜...   \n",
       "1837  私以为，辛巴这样的说法不妥。<br/><br/>其一，“我亏得不比任何一个人少”这句就不合适...   \n",
       "1838  回复<a href=\"http://xueqiu.com/n/最爱月光白\" target=\"...   \n",
       "1839  闲话不多说，进入正题：<br><br><strong>壹：现在的市场估值<br><br><b...   \n",
       "1840  2014-10-31以￥116.15卖出<a href=\"http://xueqiu.com...   \n",
       "1841  仅仅是简单定投也许会赚钱，但用钱的时候你会发现收益非常非常一般。<br><br>怎么做？做个...   \n",
       "1842  回复<a href=\"http://xueqiu.com/n/davy31\" target=...   \n",
       "1843  从大的方面来讲，资产配置的重点，就是把资产合理配置到相关系数很低的各项资产中。相关系数低，也...   \n",
       "1844  回复<a href=\"http://xueqiu.com/n/不明真相的群众\" target...   \n",
       "1845  其实真的特别简单。可是很多人一定不同意。<br><br>A股挣钱难是因为大多数时间都是高估的...   \n",
       "1846  2008年12月31日，富国银行每股净资产16.02。3个月后，它的股价跌到了7.11。pb...   \n",
       "1847  中国股市跟成熟股市最大的不同是什么？其实是散户比重过大。这里的散户并不是仅指个人，也包括很大...   \n",
       "1848  当然不是。很多所谓大盘蓝筹股实际上自由流通股非常小。<br>去掉国家这个大股东的流通股（这部...   \n",
       "1849  2014-01-06以￥91.42买入<a href=\"http://xueqiu.com/...   \n",
       "1850  2013-12-16以￥95.81买入<a href=\"http://xueqiu.com/...   \n",
       "1851  恰逢季报出尽，又是月底。这次上个全的A股估值图。<br><br>本月亮点有二：<br>1 国...   \n",
       "1852  本杰明格雷厄姆在上世纪60年代出版的，针对业余投资者的圣经（针对专业投资者的圣经则是《证券分...   \n",
       "1853  今天，看着不断暴跌的中小板，没有等到15:40 wind上的数据计算结束，我就知道，这是伟大...   \n",
       "\n",
       "                                         link sended  \n",
       "0     https://xueqiu.com/4776750571/106113411   True  \n",
       "1     https://xueqiu.com/4776750571/106077493   True  \n",
       "2     https://xueqiu.com/4776750571/106072614   True  \n",
       "3     https://xueqiu.com/4776750571/106071401   True  \n",
       "4     https://xueqiu.com/4776750571/106069090   True  \n",
       "5     https://xueqiu.com/4776750571/106068871   True  \n",
       "6     https://xueqiu.com/4776750571/106068724   True  \n",
       "7     https://xueqiu.com/4776750571/106065784   True  \n",
       "8     https://xueqiu.com/4776750571/106064144   True  \n",
       "9     https://xueqiu.com/4776750571/106061476   True  \n",
       "10    https://xueqiu.com/4776750571/106059038   True  \n",
       "11    https://xueqiu.com/4776750571/106058270   True  \n",
       "12    https://xueqiu.com/4776750571/106056058   True  \n",
       "13    https://xueqiu.com/4776750571/106050088   True  \n",
       "14    https://xueqiu.com/4776750571/106040890   True  \n",
       "15    https://xueqiu.com/4776750571/106033387   True  \n",
       "16    https://xueqiu.com/4776750571/106031069   True  \n",
       "17    https://xueqiu.com/4776750571/106029813   True  \n",
       "18    https://xueqiu.com/4776750571/106023693   True  \n",
       "19    https://xueqiu.com/4776750571/105970908   True  \n",
       "20    https://xueqiu.com/4776750571/105966165   True  \n",
       "21    https://xueqiu.com/4776750571/105958849   True  \n",
       "22    https://xueqiu.com/4776750571/105957331   True  \n",
       "23    https://xueqiu.com/4776750571/105864583   True  \n",
       "24    https://xueqiu.com/4776750571/105862794   True  \n",
       "25    https://xueqiu.com/4776750571/105859863   True  \n",
       "26    https://xueqiu.com/4776750571/105857568   True  \n",
       "27    https://xueqiu.com/4776750571/105855940   True  \n",
       "28    https://xueqiu.com/4776750571/105854112   True  \n",
       "29    https://xueqiu.com/4776750571/105841614   True  \n",
       "...                                       ...    ...  \n",
       "1824   https://xueqiu.com/4776750571/39694788   True  \n",
       "1825   https://xueqiu.com/4776750571/39619213   True  \n",
       "1826   https://xueqiu.com/4776750571/39611266   True  \n",
       "1827   https://xueqiu.com/4776750571/39421175   True  \n",
       "1828   https://xueqiu.com/4776750571/39002771   True  \n",
       "1829   https://xueqiu.com/4776750571/38927951   True  \n",
       "1830   https://xueqiu.com/4776750571/38926736   True  \n",
       "1831   https://xueqiu.com/4776750571/38705035   True  \n",
       "1832   https://xueqiu.com/4776750571/37461774   True  \n",
       "1833   https://xueqiu.com/4776750571/37379542   True  \n",
       "1834   https://xueqiu.com/4776750571/37365767   True  \n",
       "1835   https://xueqiu.com/4776750571/36351512   True  \n",
       "1836   https://xueqiu.com/4776750571/36164544   True  \n",
       "1837   https://xueqiu.com/4776750571/36127672   True  \n",
       "1838   https://xueqiu.com/4776750571/34773642   True  \n",
       "1839   https://xueqiu.com/4776750571/34758228   True  \n",
       "1840   https://xueqiu.com/4776750571/32609697   True  \n",
       "1841   https://xueqiu.com/4776750571/32357428   True  \n",
       "1842   https://xueqiu.com/4776750571/28411365   True  \n",
       "1843   https://xueqiu.com/4776750571/28380907   True  \n",
       "1844   https://xueqiu.com/4776750571/28256633   True  \n",
       "1845   https://xueqiu.com/4776750571/28256189   True  \n",
       "1846   https://xueqiu.com/4776750571/28192515   True  \n",
       "1847   https://xueqiu.com/4776750571/28168069   True  \n",
       "1848   https://xueqiu.com/4776750571/28142712   True  \n",
       "1849   https://xueqiu.com/4776750571/26959576   True  \n",
       "1850   https://xueqiu.com/4776750571/26639988   True  \n",
       "1851   https://xueqiu.com/4776750571/25926466   True  \n",
       "1852   https://xueqiu.com/4776750571/24426764   True  \n",
       "1853   https://xueqiu.com/4776750571/22523458   True  \n",
       "\n",
       "[1854 rows x 6 columns]"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the previously saved posts for this user via read_xueqiu_data.\n",
    "# NOTE(review): user_id is not defined in this cell; presumably an earlier cell sets it - confirm.\n",
    "df=read_xueqiu_data(user_id)\n",
    "# Manual reset, disabled by default: uncommenting the two lines below sets the\n",
    "# 'sended' column to False on every row and writes the frame back with save_xueqiu_data.\n",
    "# df['sended']=False\n",
    "# save_xueqiu_data(user_id,df)\n",
    "# Bare trailing expression so the notebook shows the frame as this cell's output.\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4-final"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}